# coding=gbk
import re

# Patterns for the fields of one board entry, in output order. Each pattern
# captures its value in group 1 and reads up to the closing delimiter (quote
# or tag), so values that contain spaces are captured whole.
_FIELD_PATTERNS = (
    ("rank", re.compile(r"(\d+)</i>")),
    ("image source", re.compile(r'data-src="([^"]+)"')),
    ("title", re.compile(r'title="([^"]+)"')),
    ("star", re.compile(r'<p class="star">([^<]*)</p>')),
    ("release time", re.compile(r'<p class="releasetime">([^<]+)</p>')),
    # The dot is escaped: the integer part is digits followed by a literal ".".
    ("score integer part", re.compile(r'<i class="integer">(\d+\.)</i>')),
    ("score fraction part", re.compile(r'<i class="fraction">(\d)</i>')),
)


def _first_match(field, pattern, html):
    """Return the stripped group 1 of the first match of *pattern* in *html*.

    Raises:
        IndexError: if *pattern* does not occur in *html*. The exception type
            is the one the former ``findall(html)[0]`` lookup raised.
    """
    found = pattern.search(html)
    if found is None:
        raise IndexError("no {} found in html".format(field))
    return found.group(1).strip()


def parse_one_page(html):
    """Extract the first board entry from *html*, print it and return it.

    The fields are taken from the first occurrence of each pattern in
    *html*: rank, image URL (``data-src``), title, star line, release time,
    and the integer (with trailing dot) and fraction parts of the score.

    Args:
        html: Markup of the page (or of a single entry) as a string.

    Returns:
        A list holding one 7-tuple of strings:
        ``(rank, source, title, star, time, integer, fraction)``.

    Raises:
        IndexError: if any of the fields cannot be found in *html*.
    """
    entry = tuple(
        _first_match(field, pattern, html)
        for field, pattern in _FIELD_PATTERNS
    )
    result = [entry]
    # Printing is kept for existing script usage; the value is also returned
    # so callers can use the parsed data.
    print(result)
    return result


# Script entry: load the saved page from disk, then parse and print its
# first entry.
with open("7-6-3.html", mode="r", encoding="utf8") as page_file:
    page_html = page_file.read()
parse_one_page(page_html)